{
    "model_path": "/data/feng/hf-models/Llama-2-7b-chat-hf",
    "model_type": "causal",
    "model_id": "llama-2-7b-chat-e5-large-v2-pretrain-ml=40",
    "reencoder": "intfloat/e5-large-v2",
    "max_input_length": 512,
    "dtype": "bfloat16",
    "seed": 42,
    "use_flash_attention_2": true,
    "generation_configs": {
        "temperature": 0.6,
        "top_p": 0.9,
        "max_new_tokens": 40,
        "do_sample": true
    },
    "batch_size": 50,
    "disable_instruction": false,
    "pattern": "[INST] Your task is to give an answer according to the instruction and input. Please keep your answer short.\n\nInput: {input}\n\nInstruction: {instruction}\n\n### Your Answer: [/INST]"
}